import pickle
from pathlib import Path

import numpy as np

# Generate simulated (random) image/text embedding pairs and pickle them.
# The legacy global RNG is seeded with a fixed value so that every run
# produces the same arrays.
np.random.seed(42)
num_samples = 1000
embedding_dim = 128

# Image embeddings: array of shape (num_samples, embedding_dim) drawn from
# a standard normal distribution.
image_embeddings = np.random.randn(num_samples, embedding_dim)

# Text embeddings: same shape, drawn independently right after the image
# embeddings (the draw order matters for reproducibility under the seed).
text_embeddings = np.random.randn(num_samples, embedding_dim)

# Pair the i-th image embedding with the i-th text embedding. The result is
# a list of num_samples tuples, each holding two 1-D arrays of length
# embedding_dim.
data = list(zip(image_embeddings, text_embeddings))

# Persist the pairs under src/model_pth/, resolved relative to the current
# working directory. Create the directory first: open(..., 'wb') does not
# create missing parent directories and would raise FileNotFoundError.
output_path = Path('src/model_pth/data.pkl')
output_path.parent.mkdir(parents=True, exist_ok=True)
with output_path.open('wb') as f:
    pickle.dump(data, f)